timewanderer committed on
Commit
a884a25
1 Parent(s): add581a

Training in progress, step 500

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:181452760f4889fb1745514a4de50facf35adde53641198d68d40c6fbe42eedd
3
  size 268290900
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db7b0ba484d365a8232c614da6b35c1ca8564e014b51324208c27b61981f817d
3
  size 268290900
run-0/checkpoint-500/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:24cbed69717346d4505abce38ecb7db4d97f2f1981fd7e65cde9a68936fb2155
3
  size 268290900
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db7b0ba484d365a8232c614da6b35c1ca8564e014b51324208c27b61981f817d
3
  size 268290900
run-0/checkpoint-500/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6779aff1e85bbb508f31d389d707a8f6c4de7de20d089e13616f934b3a1e8b10
3
  size 536643898
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:91a7ce88c184ba71db5dc4fa9fb784f1d4bdb6de5d88f8d28bb6d60f143ead33
3
  size 536643898
run-0/checkpoint-500/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:98041bd7cae455426e290a1a0ee683bd5dd30893f7451fec3a464ae8995b17e4
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e1264523e958cf7990dc5f42d876cc12129475c4603804cf66868aaf25c2c24
3
  size 1064
run-0/checkpoint-500/trainer_state.json CHANGED
@@ -10,25 +10,25 @@
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
- "eval_accuracy": 0.5767741935483871,
14
- "eval_loss": 0.18995507061481476,
15
- "eval_runtime": 5.3293,
16
- "eval_samples_per_second": 581.689,
17
- "eval_steps_per_second": 12.197,
18
  "step": 318
19
  },
20
  {
21
  "epoch": 1.5723270440251573,
22
- "grad_norm": 0.5155988335609436,
23
- "learning_rate": 1.650593990216632e-05,
24
- "loss": 0.3062,
25
  "step": 500
26
  }
27
  ],
28
  "logging_steps": 500,
29
- "max_steps": 2862,
30
  "num_input_tokens_seen": 0,
31
- "num_train_epochs": 9,
32
  "save_steps": 500,
33
  "stateful_callbacks": {
34
  "TrainerControl": {
@@ -46,8 +46,8 @@
46
  "train_batch_size": 48,
47
  "trial_name": null,
48
  "trial_params": {
49
- "alpha": 0.39616967623231003,
50
- "num_train_epochs": 9,
51
- "temperature": 20
52
  }
53
  }
 
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
+ "eval_accuracy": 0.6083870967741936,
14
+ "eval_loss": 0.26111724972724915,
15
+ "eval_runtime": 5.07,
16
+ "eval_samples_per_second": 611.445,
17
+ "eval_steps_per_second": 12.821,
18
  "step": 318
19
  },
20
  {
21
  "epoch": 1.5723270440251573,
22
+ "grad_norm": 0.612690269947052,
23
+ "learning_rate": 1.371069182389937e-05,
24
+ "loss": 0.4067,
25
  "step": 500
26
  }
27
  ],
28
  "logging_steps": 500,
29
+ "max_steps": 1590,
30
  "num_input_tokens_seen": 0,
31
+ "num_train_epochs": 5,
32
  "save_steps": 500,
33
  "stateful_callbacks": {
34
  "TrainerControl": {
 
46
  "train_batch_size": 48,
47
  "trial_name": null,
48
  "trial_params": {
49
+ "alpha": 0.006505868879858823,
50
+ "num_train_epochs": 5,
51
+ "temperature": 4
52
  }
53
  }
run-0/checkpoint-500/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d45fdb811c2d25bdfa6f70464c8f8897df3766bc1abc5d6e057a6e0a40f0dc9f
3
  size 5240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ffe43401e68c8a3628adf33b38f6ac638a3a3f3bc1dcbe05d52f58aece31629f
3
  size 5240
runs/Oct11_14-59-09_984d9c1bc9e1/events.out.tfevents.1728659192.984d9c1bc9e1.1239.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5dc94bd8a43b2c84d03f0e5ac80a3deaf53792d4812204783528a3359f7d10da
3
+ size 12975
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6f44d7647a25bb8e1432bec942b7c9fce7cd5c43c5497aaddf8f9e0d9aeee28b
3
  size 5240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ffe43401e68c8a3628adf33b38f6ac638a3a3f3bc1dcbe05d52f58aece31629f
3
  size 5240