timewanderer committed on
Commit
58a724e
1 Parent(s): e13f163

Training in progress, step 500

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b33a2a62d28195b19d499e7488708c875b8b4a2f93577e25e2b236442f40b382
3
  size 268290900
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cffdaf73e0b6a284c8442673d7ba025740d7309ed5dfb3d7ac54c473816a869a
3
  size 268290900
run-4/checkpoint-500/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d272d8ae2148cfa753bece5873f4a422d8b62dbf9579f13ddb7713129eb2f09e
3
  size 268290900
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cffdaf73e0b6a284c8442673d7ba025740d7309ed5dfb3d7ac54c473816a869a
3
  size 268290900
run-4/checkpoint-500/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:64159136088906be185337159e8ab13fe0e786490d680522a0372b2be061dd3c
3
  size 536643898
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb284d6406695d9c68ff21422fe32da7603f4d1b5919d5a7f09a05ec0ea28dd3
3
  size 536643898
run-4/checkpoint-500/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:98041bd7cae455426e290a1a0ee683bd5dd30893f7451fec3a464ae8995b17e4
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e1264523e958cf7990dc5f42d876cc12129475c4603804cf66868aaf25c2c24
3
  size 1064
run-4/checkpoint-500/trainer_state.json CHANGED
@@ -10,25 +10,25 @@
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
- "eval_accuracy": 0.5812903225806452,
14
- "eval_loss": 0.19345349073410034,
15
- "eval_runtime": 5.6622,
16
- "eval_samples_per_second": 547.491,
17
- "eval_steps_per_second": 11.48,
18
  "step": 318
19
  },
20
  {
21
  "epoch": 1.5723270440251573,
22
- "grad_norm": 0.5203747153282166,
23
- "learning_rate": 1.650593990216632e-05,
24
- "loss": 0.3117,
25
  "step": 500
26
  }
27
  ],
28
  "logging_steps": 500,
29
- "max_steps": 2862,
30
  "num_input_tokens_seen": 0,
31
- "num_train_epochs": 9,
32
  "save_steps": 500,
33
  "stateful_callbacks": {
34
  "TrainerControl": {
@@ -46,8 +46,8 @@
46
  "train_batch_size": 48,
47
  "trial_name": null,
48
  "trial_params": {
49
- "alpha": 0.7805733466574912,
50
- "num_train_epochs": 9,
51
- "temperature": 15
52
  }
53
  }
 
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
+ "eval_accuracy": 0.6325806451612903,
14
+ "eval_loss": 0.3024460971355438,
15
+ "eval_runtime": 5.4182,
16
+ "eval_samples_per_second": 572.151,
17
+ "eval_steps_per_second": 11.997,
18
  "step": 318
19
  },
20
  {
21
  "epoch": 1.5723270440251573,
22
+ "grad_norm": 0.6661854386329651,
23
+ "learning_rate": 1.371069182389937e-05,
24
+ "loss": 0.4696,
25
  "step": 500
26
  }
27
  ],
28
  "logging_steps": 500,
29
+ "max_steps": 1590,
30
  "num_input_tokens_seen": 0,
31
+ "num_train_epochs": 5,
32
  "save_steps": 500,
33
  "stateful_callbacks": {
34
  "TrainerControl": {
 
46
  "train_batch_size": 48,
47
  "trial_name": null,
48
  "trial_params": {
49
+ "alpha": 0.41539799624272716,
50
+ "num_train_epochs": 5,
51
+ "temperature": 3
52
  }
53
  }
run-4/checkpoint-500/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:144c14751c6724502091771d5dc8c2ea86a626bf83ae992161b671e93528c094
3
  size 5240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:42fcda7114a3cb0f210fff0e0a799f161a86990fe91444d8130cb28445b06005
3
  size 5240
runs/Oct12_05-09-37_f46fcd247c16/events.out.tfevents.1728712315.f46fcd247c16.522.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2495a9b1b9e460f45d10d4d35c9c67a3963871dbe8b3486db5500db96a503ef4
3
+ size 13832
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5ef5b259539127ef5ddc697d31b7e7180caca610f845f70ff2cba869a6149cf5
3
  size 5240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:42fcda7114a3cb0f210fff0e0a799f161a86990fe91444d8130cb28445b06005
3
  size 5240