Training in progress, epoch 14
Browse files
log.txt
CHANGED
@@ -170,3 +170,16 @@
|
|
170 |
{'loss': 0.0889, 'grad_norm': 32.98908996582031, 'learning_rate': 7.414537393536344e-06, 'epoch': 12.78}
|
171 |
{'loss': 0.0837, 'grad_norm': 0.6928532719612122, 'learning_rate': 7.1228561428071415e-06, 'epoch': 12.86}
|
172 |
{'loss': 0.0897, 'grad_norm': 26.65106773376465, 'learning_rate': 6.831174892077938e-06, 'epoch': 12.95}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
170 |
{'loss': 0.0889, 'grad_norm': 32.98908996582031, 'learning_rate': 7.414537393536344e-06, 'epoch': 12.78}
|
171 |
{'loss': 0.0837, 'grad_norm': 0.6928532719612122, 'learning_rate': 7.1228561428071415e-06, 'epoch': 12.86}
|
172 |
{'loss': 0.0897, 'grad_norm': 26.65106773376465, 'learning_rate': 6.831174892077938e-06, 'epoch': 12.95}
|
173 |
+
[2 2 2 ... 0 2 0] [0 0 2 ... 0 1 0]
|
174 |
+
{'eval_loss': 4.996224403381348, 'eval_accuracy': 0.41859909156108055, 'eval_runtime': 6.3438, 'eval_samples_per_second': 659.384, 'eval_steps_per_second': 20.65, 'epoch': 13.0}
|
175 |
+
{'loss': 0.0757, 'grad_norm': 3.703233242034912, 'learning_rate': 6.539493641348734e-06, 'epoch': 13.04}
|
176 |
+
{'loss': 0.0704, 'grad_norm': 0.7255619764328003, 'learning_rate': 6.247812390619531e-06, 'epoch': 13.13}
|
177 |
+
{'loss': 0.0768, 'grad_norm': 21.543807983398438, 'learning_rate': 5.956131139890328e-06, 'epoch': 13.21}
|
178 |
+
{'loss': 0.0742, 'grad_norm': 22.987957000732422, 'learning_rate': 5.664449889161125e-06, 'epoch': 13.3}
|
179 |
+
{'loss': 0.0838, 'grad_norm': 9.414430618286133, 'learning_rate': 5.372768638431922e-06, 'epoch': 13.39}
|
180 |
+
{'loss': 0.0762, 'grad_norm': 16.92205047607422, 'learning_rate': 5.0810873877027185e-06, 'epoch': 13.48}
|
181 |
+
{'loss': 0.0751, 'grad_norm': 16.747333526611328, 'learning_rate': 4.789406136973516e-06, 'epoch': 13.56}
|
182 |
+
{'loss': 0.0784, 'grad_norm': 4.207192420959473, 'learning_rate': 4.497724886244312e-06, 'epoch': 13.65}
|
183 |
+
{'loss': 0.0704, 'grad_norm': 6.768477916717529, 'learning_rate': 4.206043635515109e-06, 'epoch': 13.74}
|
184 |
+
{'loss': 0.0711, 'grad_norm': 10.230005264282227, 'learning_rate': 3.914362384785906e-06, 'epoch': 13.83}
|
185 |
+
{'loss': 0.0823, 'grad_norm': 0.6493052244186401, 'learning_rate': 3.6226811340567034e-06, 'epoch': 13.91}
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 267829484
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7de8fcb517432e324d4b232b48404ea2e16c07751a2008925cb18c2aae68c828
|
3 |
size 267829484
|
runs/Mar14_16-58-52_cehsc-app-001.ad.unlv.edu/events.out.tfevents.1710460734.cehsc-app-001.ad.unlv.edu.4089564.0
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:81830bf38b69fa646374d7f917cb0ad7d637df5ce0d1752b02acb0ef8336b82c
|
3 |
+
size 43433
|