devvanshhh committed on
Commit
b79d5e9
1 Parent(s): 4fa00d7

Training in progress, step 325, checkpoint

Browse files
last-checkpoint/adapter_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d5107c1e3e4f20ae2d01a00b3177144426b219e54afd7614b9d02e74c2f3ab6c
3
  size 369214349
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a20f14db164c17692212d5858de370ffc0ef9edfed58656c48949e0451fad852
3
  size 369214349
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0e782e84e692f02fbda556cdbd0b56b2a3476ed6be137830fbce02e8d2ddd8f0
3
  size 369142184
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e351d9c62d6220a627e18e224ca4abddc55e39d1617fd6e7ba21c0ebf62ce8e
3
  size 369142184
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c958eb1a8503f4eae4085bedb0c3056eb4754c9d3f629842f1aaa1c94f086b2e
3
  size 738393861
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1c1bdf4f98adae7838dbe4cb68bdeae77e4323f5c379cb612dd480aaafe7f67
3
  size 738393861
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:862164832507ca0755143b19a96acb896b1f394e94065e94a7857cbe9c8453dc
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7c9dd26c37219b5c1bddc661447d8b58d02fabacf2155bbc4c46e2ef98d15e5a
3
  size 14575
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c3e02e4b8a74e841ee5a1ce8c453a9becb15f5be6cbcdd100b814e93235dab36
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:840e24cad9f717e9dc7387ea92e5c63c97ae1fbdfb0704ed051dd9f95a2737bb
3
  size 627
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.41208791208791207,
5
  "eval_steps": 500,
6
- "global_step": 300,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -79,13 +79,19 @@
79
  "learning_rate": 0.0002,
80
  "loss": 0.7793,
81
  "step": 300
 
 
 
 
 
 
82
  }
83
  ],
84
  "logging_steps": 25,
85
  "max_steps": 728,
86
  "num_train_epochs": 1,
87
  "save_steps": 25,
88
- "total_flos": 2899555803168768.0,
89
  "trial_name": null,
90
  "trial_params": null
91
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.44642857142857145,
5
  "eval_steps": 500,
6
+ "global_step": 325,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
79
  "learning_rate": 0.0002,
80
  "loss": 0.7793,
81
  "step": 300
82
+ },
83
+ {
84
+ "epoch": 0.45,
85
+ "learning_rate": 0.0002,
86
+ "loss": 1.0234,
87
+ "step": 325
88
  }
89
  ],
90
  "logging_steps": 25,
91
  "max_steps": 728,
92
  "num_train_epochs": 1,
93
  "save_steps": 25,
94
+ "total_flos": 3200350359748608.0,
95
  "trial_name": null,
96
  "trial_params": null
97
  }