daze-unlv commited on
Commit
f66a776
1 Parent(s): 9931ef2

Training in progress, epoch 14

Browse files
log.txt CHANGED
@@ -170,3 +170,16 @@
170
  {'loss': 0.0889, 'grad_norm': 32.98908996582031, 'learning_rate': 7.414537393536344e-06, 'epoch': 12.78}
171
  {'loss': 0.0837, 'grad_norm': 0.6928532719612122, 'learning_rate': 7.1228561428071415e-06, 'epoch': 12.86}
172
  {'loss': 0.0897, 'grad_norm': 26.65106773376465, 'learning_rate': 6.831174892077938e-06, 'epoch': 12.95}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
170
  {'loss': 0.0889, 'grad_norm': 32.98908996582031, 'learning_rate': 7.414537393536344e-06, 'epoch': 12.78}
171
  {'loss': 0.0837, 'grad_norm': 0.6928532719612122, 'learning_rate': 7.1228561428071415e-06, 'epoch': 12.86}
172
  {'loss': 0.0897, 'grad_norm': 26.65106773376465, 'learning_rate': 6.831174892077938e-06, 'epoch': 12.95}
173
+ [2 2 2 ... 0 2 0] [0 0 2 ... 0 1 0]
174
+ {'eval_loss': 4.996224403381348, 'eval_accuracy': 0.41859909156108055, 'eval_runtime': 6.3438, 'eval_samples_per_second': 659.384, 'eval_steps_per_second': 20.65, 'epoch': 13.0}
175
+ {'loss': 0.0757, 'grad_norm': 3.703233242034912, 'learning_rate': 6.539493641348734e-06, 'epoch': 13.04}
176
+ {'loss': 0.0704, 'grad_norm': 0.7255619764328003, 'learning_rate': 6.247812390619531e-06, 'epoch': 13.13}
177
+ {'loss': 0.0768, 'grad_norm': 21.543807983398438, 'learning_rate': 5.956131139890328e-06, 'epoch': 13.21}
178
+ {'loss': 0.0742, 'grad_norm': 22.987957000732422, 'learning_rate': 5.664449889161125e-06, 'epoch': 13.3}
179
+ {'loss': 0.0838, 'grad_norm': 9.414430618286133, 'learning_rate': 5.372768638431922e-06, 'epoch': 13.39}
180
+ {'loss': 0.0762, 'grad_norm': 16.92205047607422, 'learning_rate': 5.0810873877027185e-06, 'epoch': 13.48}
181
+ {'loss': 0.0751, 'grad_norm': 16.747333526611328, 'learning_rate': 4.789406136973516e-06, 'epoch': 13.56}
182
+ {'loss': 0.0784, 'grad_norm': 4.207192420959473, 'learning_rate': 4.497724886244312e-06, 'epoch': 13.65}
183
+ {'loss': 0.0704, 'grad_norm': 6.768477916717529, 'learning_rate': 4.206043635515109e-06, 'epoch': 13.74}
184
+ {'loss': 0.0711, 'grad_norm': 10.230005264282227, 'learning_rate': 3.914362384785906e-06, 'epoch': 13.83}
185
+ {'loss': 0.0823, 'grad_norm': 0.6493052244186401, 'learning_rate': 3.6226811340567034e-06, 'epoch': 13.91}
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7f255ef9e96b68d315888f1664a94af59595316c1367181d81a21b8ed782e5c8
3
  size 267829484
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7de8fcb517432e324d4b232b48404ea2e16c07751a2008925cb18c2aae68c828
3
  size 267829484
runs/Mar14_16-58-52_cehsc-app-001.ad.unlv.edu/events.out.tfevents.1710460734.cehsc-app-001.ad.unlv.edu.4089564.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8a495dd63df50de05aca5a3a97ec3d021a676894722d9d297d68ef91dc6a9a2b
3
- size 40524
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81830bf38b69fa646374d7f917cb0ad7d637df5ce0d1752b02acb0ef8336b82c
3
+ size 43433