k-r-l committed on
Commit
e29c17d
1 Parent(s): b8b20f6

Training in progress, step 6, checkpoint

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:45b69b38f30c9123191de0b8828377ed369b0f837f3773e9ff0d96384f02ce82
3
- size 6979130
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a9e53fe451017a13010594dadfb5397d4346a7e0c68a800e93e1755de161d87a
3
+ size 7309882
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5a97cec4ccaf7b86834a2fdb06e10135db381a62fd0dc050dc49420427220909
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7a34833b1148ea746b3aaefd6499b7286814fc0502accf3a99066160145f0cf2
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.050955414012738856,
5
  "eval_steps": 500,
6
- "global_step": 5,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -97,12 +97,30 @@
97
  "rewards/margins": 0.006132860202342272,
98
  "rewards/rejected": -0.2816582918167114,
99
  "step": 5
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
100
  }
101
  ],
102
  "logging_steps": 1,
103
- "max_steps": 5,
104
  "num_input_tokens_seen": 0,
105
- "num_train_epochs": 1,
106
  "save_steps": 1,
107
  "stateful_callbacks": {
108
  "TrainerControl": {
@@ -111,7 +129,7 @@
111
  "should_evaluate": false,
112
  "should_log": false,
113
  "should_save": true,
114
- "should_training_stop": true
115
  },
116
  "attributes": {}
117
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.061146496815286625,
5
  "eval_steps": 500,
6
+ "global_step": 6,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
97
  "rewards/margins": 0.006132860202342272,
98
  "rewards/rejected": -0.2816582918167114,
99
  "step": 5
100
+ },
101
+ {
102
+ "epoch": 0.061146496815286625,
103
+ "grad_norm": 1.755154013633728,
104
+ "learning_rate": 9.79591836734694e-05,
105
+ "log_odds_chosen": 0.09281320869922638,
106
+ "log_odds_ratio": -0.6549628973007202,
107
+ "logits/chosen": -0.5153884291648865,
108
+ "logits/rejected": -0.5407605767250061,
109
+ "logps/chosen": -2.8005495071411133,
110
+ "logps/rejected": -2.8862051963806152,
111
+ "loss": 3.2371,
112
+ "nll_loss": 3.171649217605591,
113
+ "rewards/accuracies": 0.625,
114
+ "rewards/chosen": -0.2800549566745758,
115
+ "rewards/margins": 0.008565555326640606,
116
+ "rewards/rejected": -0.2886205315589905,
117
+ "step": 6
118
  }
119
  ],
120
  "logging_steps": 1,
121
+ "max_steps": 294,
122
  "num_input_tokens_seen": 0,
123
+ "num_train_epochs": 3,
124
  "save_steps": 1,
125
  "stateful_callbacks": {
126
  "TrainerControl": {
 
129
  "should_evaluate": false,
130
  "should_log": false,
131
  "should_save": true,
132
+ "should_training_stop": false
133
  },
134
  "attributes": {}
135
  }
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:17dece46f2086166fcf5d15834c0696840efd4c8cdeff75c12fb5279c16e0afe
3
  size 5560
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ee18ea0c5cd8ab4dc26bcfd2b5da8b145de03666713371dc25009f17b330bef
3
  size 5560