mkopecki committed on
Commit
6bbb597
1 Parent(s): 12c807e

End of training

Browse files
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:853b3e25a4f56a4058e2078c5744e4f1921ae8c9ef88fca3ca29050b836218f6
3
  size 167832240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7796a8b8b48c8a65dd69eaa720ca767ce8793f9c21b27bee282ae5a9c1fd9103
3
  size 167832240
runs/Jul14_14-59-55_ml-cluster/events.out.tfevents.1720969199.ml-cluster CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1f4be315bf2ecfce060091693340341a56f61b00183d03eb0162c1fa7c6c9d94
3
- size 5702
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:acc2a729553151c5f4b3d68429955e6d2be2f98470663adfcc4d2397c395885b
3
+ size 6267
trainer_state.json CHANGED
@@ -10,19 +10,19 @@
10
  "log_history": [
11
  {
12
  "epoch": 2.9940119760479043,
13
- "grad_norm": 2.417518377304077,
14
  "learning_rate": 9.98003992015968e-08,
15
- "loss": 0.9995,
16
  "step": 500
17
  },
18
  {
19
  "epoch": 3.0,
20
  "step": 501,
21
- "total_flos": 2.0033559725080576e+16,
22
- "train_loss": 0.9991578065944527,
23
- "train_runtime": 874.8982,
24
- "train_samples_per_second": 2.287,
25
- "train_steps_per_second": 0.573
26
  }
27
  ],
28
  "logging_steps": 500,
@@ -42,7 +42,7 @@
42
  "attributes": {}
43
  }
44
  },
45
- "total_flos": 2.0033559725080576e+16,
46
  "train_batch_size": 1,
47
  "trial_name": null,
48
  "trial_params": null
 
10
  "log_history": [
11
  {
12
  "epoch": 2.9940119760479043,
13
+ "grad_norm": 2.0207631587982178,
14
  "learning_rate": 9.98003992015968e-08,
15
+ "loss": 0.9071,
16
  "step": 500
17
  },
18
  {
19
  "epoch": 3.0,
20
  "step": 501,
21
+ "total_flos": 2.157617842277581e+16,
22
+ "train_loss": 0.9067429488528512,
23
+ "train_runtime": 916.1317,
24
+ "train_samples_per_second": 2.184,
25
+ "train_steps_per_second": 0.547
26
  }
27
  ],
28
  "logging_steps": 500,
 
42
  "attributes": {}
43
  }
44
  },
45
+ "total_flos": 2.157617842277581e+16,
46
  "train_batch_size": 1,
47
  "trial_name": null,
48
  "trial_params": null