Training in progress, epoch 10
Browse files
log.txt
CHANGED
@@ -116,3 +116,17 @@
|
|
116 |
{'loss': 0.185, 'grad_norm': 16.464384078979492, 'learning_rate': 2.083187492707969e-05, 'epoch': 8.75}
|
117 |
{'loss': 0.1794, 'grad_norm': 20.86390495300293, 'learning_rate': 2.0540193676350487e-05, 'epoch': 8.84}
|
118 |
{'loss': 0.1843, 'grad_norm': 14.848393440246582, 'learning_rate': 2.0248512425621283e-05, 'epoch': 8.93}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
116 |
{'loss': 0.185, 'grad_norm': 16.464384078979492, 'learning_rate': 2.083187492707969e-05, 'epoch': 8.75}
|
117 |
{'loss': 0.1794, 'grad_norm': 20.86390495300293, 'learning_rate': 2.0540193676350487e-05, 'epoch': 8.84}
|
118 |
{'loss': 0.1843, 'grad_norm': 14.848393440246582, 'learning_rate': 2.0248512425621283e-05, 'epoch': 8.93}
|
119 |
+
[1 2 2 ... 0 2 0] [0 0 2 ... 0 1 0]
|
120 |
+
{'eval_loss': 3.4013631343841553, 'eval_accuracy': 0.4159693999521874, 'eval_runtime': 6.5155, 'eval_samples_per_second': 642.004, 'eval_steps_per_second': 20.106, 'epoch': 9.0}
|
121 |
+
{'loss': 0.1752, 'grad_norm': 16.65215301513672, 'learning_rate': 1.995683117489208e-05, 'epoch': 9.01}
|
122 |
+
{'loss': 0.1354, 'grad_norm': 30.883514404296875, 'learning_rate': 1.9665149924162876e-05, 'epoch': 9.1}
|
123 |
+
{'loss': 0.1378, 'grad_norm': 24.399015426635742, 'learning_rate': 1.9373468673433673e-05, 'epoch': 9.19}
|
124 |
+
{'loss': 0.1382, 'grad_norm': 10.105205535888672, 'learning_rate': 1.908178742270447e-05, 'epoch': 9.28}
|
125 |
+
{'loss': 0.1364, 'grad_norm': 17.550519943237305, 'learning_rate': 1.8790106171975266e-05, 'epoch': 9.36}
|
126 |
+
{'loss': 0.1429, 'grad_norm': 14.63619613647461, 'learning_rate': 1.8498424921246062e-05, 'epoch': 9.45}
|
127 |
+
{'loss': 0.1484, 'grad_norm': 20.125774383544922, 'learning_rate': 1.820674367051686e-05, 'epoch': 9.54}
|
128 |
+
{'loss': 0.1447, 'grad_norm': 9.442309379577637, 'learning_rate': 1.7915062419787655e-05, 'epoch': 9.63}
|
129 |
+
{'loss': 0.1441, 'grad_norm': 3.3339831829071045, 'learning_rate': 1.7623381169058455e-05, 'epoch': 9.71}
|
130 |
+
{'loss': 0.1422, 'grad_norm': 12.243080139160156, 'learning_rate': 1.733169991832925e-05, 'epoch': 9.8}
|
131 |
+
{'loss': 0.1515, 'grad_norm': 8.44780158996582, 'learning_rate': 1.7040018667600048e-05, 'epoch': 9.89}
|
132 |
+
{'loss': 0.1478, 'grad_norm': 7.068332672119141, 'learning_rate': 1.6748337416870844e-05, 'epoch': 9.98}
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 267829484
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ac30861de0c27028361f5da5d9a0bd97c4cab21faff9986509bda049d847e6ed
|
3 |
size 267829484
|
runs/Mar14_16-58-52_cehsc-app-001.ad.unlv.edu/events.out.tfevents.1710460734.cehsc-app-001.ad.unlv.edu.4089564.0
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d4d163f603a4a4c14b2029c8b0493aca597b4cf8b89ac9aa411ec6ee1656120f
|
3 |
+
size 32227
|