k-r-l committed on
Commit
65fe405
1 Parent(s): 99eecbb

Training in progress, step 9, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8398c0e5bddec9eb883e0399f65b755d78d063f3b9ecbe58f175f44f364cc7e9
3
  size 13648432
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a9591d33d66a228df18f40bf825bff99e72c5c3fdd285bcba0bc42330ed2316a
3
  size 13648432
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:35967646370f39bc8adcdeb6bb4be3fa34ef34aa59b57e6a7303e7a39ef1094c
3
  size 7309882
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f044fa49bfb4d2bbfcec57213268099d307fbc95f23e06ec1b2719c4ce4e5ff
3
  size 7309882
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:600149e975d1bacd170387afa159597e660c1a6e94a6b29b69de17c6162d48a4
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:43add00f7e103ff8ae7c8e9ba6ae78e3693180f4799be0f85468cd77804118b2
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.08152866242038216,
5
  "eval_steps": 500,
6
- "global_step": 8,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -151,6 +151,24 @@
151
  "rewards/margins": 0.009154656901955605,
152
  "rewards/rejected": -0.28212225437164307,
153
  "step": 8
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
154
  }
155
  ],
156
  "logging_steps": 1,
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.09171974522292993,
5
  "eval_steps": 500,
6
+ "global_step": 9,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
151
  "rewards/margins": 0.009154656901955605,
152
  "rewards/rejected": -0.28212225437164307,
153
  "step": 8
154
+ },
155
+ {
156
+ "epoch": 0.09171974522292993,
157
+ "grad_norm": 1.9783447980880737,
158
+ "learning_rate": 9.693877551020408e-05,
159
+ "log_odds_chosen": 0.05389028042554855,
160
+ "log_odds_ratio": -0.6711492538452148,
161
+ "logits/chosen": -0.5444136261940002,
162
+ "logits/rejected": -0.564105212688446,
163
+ "logps/chosen": -2.688671112060547,
164
+ "logps/rejected": -2.7393460273742676,
165
+ "loss": 3.1182,
166
+ "nll_loss": 3.051093101501465,
167
+ "rewards/accuracies": 0.59375,
168
+ "rewards/chosen": -0.2688670754432678,
169
+ "rewards/margins": 0.005067505408078432,
170
+ "rewards/rejected": -0.27393460273742676,
171
+ "step": 9
172
  }
173
  ],
174
  "logging_steps": 1,