k-r-l committed on
Commit
4bfdd8f
1 Parent(s): a37d263

Training in progress, step 11, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fe2e764601139447b09b1940cad4fcd131d157b3e2784066a3141e9bfbdee2e4
3
  size 13648432
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd5001970a94c1aeb2be404f63b934153c6a8afecd421ffb89f6ae43dfb02029
3
  size 13648432
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0cd62999c0283cf985daa9ac4c15a5bad20101c134a614f464395a815e2f477f
3
  size 7309882
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b961d010e7b252944302920bab7291331927a0492c9deec402fe522402693a0c
3
  size 7309882
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9a02099495f1ee0f69345f2400d62a00da3dfa60ed976e72211dd9b267ea7c6f
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e23ccafad489da96357ee6455b0c6b7c38f2cddbd7f8464d5fb60ce0c29726cc
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.10191082802547771,
5
  "eval_steps": 500,
6
- "global_step": 10,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -187,6 +187,24 @@
187
  "rewards/margins": 0.004964826162904501,
188
  "rewards/rejected": -0.27728739380836487,
189
  "step": 10
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
190
  }
191
  ],
192
  "logging_steps": 1,
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.11210191082802548,
5
  "eval_steps": 500,
6
+ "global_step": 11,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
187
  "rewards/margins": 0.004964826162904501,
188
  "rewards/rejected": -0.27728739380836487,
189
  "step": 10
190
+ },
191
+ {
192
+ "epoch": 0.11210191082802548,
193
+ "grad_norm": 2.745220422744751,
194
+ "learning_rate": 9.625850340136054e-05,
195
+ "log_odds_chosen": 0.0562276728451252,
196
+ "log_odds_ratio": -0.6704986095428467,
197
+ "logits/chosen": -0.5921126008033752,
198
+ "logits/rejected": -0.5893128514289856,
199
+ "logps/chosen": -2.645206928253174,
200
+ "logps/rejected": -2.696500539779663,
201
+ "loss": 3.0034,
202
+ "nll_loss": 2.936365842819214,
203
+ "rewards/accuracies": 0.65625,
204
+ "rewards/chosen": -0.26452070474624634,
205
+ "rewards/margins": 0.005129385739564896,
206
+ "rewards/rejected": -0.26965007185935974,
207
+ "step": 11
208
  }
209
  ],
210
  "logging_steps": 1,