k-r-l committed on
Commit
43d8e3c
1 Parent(s): 532829f

Training in progress, step 10, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a9591d33d66a228df18f40bf825bff99e72c5c3fdd285bcba0bc42330ed2316a
3
  size 13648432
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fe2e764601139447b09b1940cad4fcd131d157b3e2784066a3141e9bfbdee2e4
3
  size 13648432
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9f044fa49bfb4d2bbfcec57213268099d307fbc95f23e06ec1b2719c4ce4e5ff
3
  size 7309882
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0cd62999c0283cf985daa9ac4c15a5bad20101c134a614f464395a815e2f477f
3
  size 7309882
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:43add00f7e103ff8ae7c8e9ba6ae78e3693180f4799be0f85468cd77804118b2
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a02099495f1ee0f69345f2400d62a00da3dfa60ed976e72211dd9b267ea7c6f
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.09171974522292993,
5
  "eval_steps": 500,
6
- "global_step": 9,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -169,6 +169,24 @@
169
  "rewards/margins": 0.005067505408078432,
170
  "rewards/rejected": -0.27393460273742676,
171
  "step": 9
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
172
  }
173
  ],
174
  "logging_steps": 1,
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.10191082802547771,
5
  "eval_steps": 500,
6
+ "global_step": 10,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
169
  "rewards/margins": 0.005067505408078432,
170
  "rewards/rejected": -0.27393460273742676,
171
  "step": 9
172
+ },
173
+ {
174
+ "epoch": 0.10191082802547771,
175
+ "grad_norm": 3.7560782432556152,
176
+ "learning_rate": 9.659863945578231e-05,
177
+ "log_odds_chosen": 0.05389935150742531,
178
+ "log_odds_ratio": -0.6712656617164612,
179
+ "logits/chosen": -0.5685052871704102,
180
+ "logits/rejected": -0.5835959911346436,
181
+ "logps/chosen": -2.7232255935668945,
182
+ "logps/rejected": -2.772873878479004,
183
+ "loss": 3.1185,
184
+ "nll_loss": 3.0513598918914795,
185
+ "rewards/accuracies": 0.65625,
186
+ "rewards/chosen": -0.27232253551483154,
187
+ "rewards/margins": 0.004964826162904501,
188
+ "rewards/rejected": -0.27728739380836487,
189
+ "step": 10
190
  }
191
  ],
192
  "logging_steps": 1,