k-r-l committed on
Commit
6985bbc
1 Parent(s): aefddb8

Training in progress, step 5, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2964054f1ce3e570a5a5925bda48122ddbb54f44b42b96aedd7cdbdff7c2ac52
3
  size 13648432
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f903071cb570bd7851966ec6fec44995d89982155ffda29cdb6967725c304a7d
3
  size 13648432
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f6ba377c6ceb87dee6a4489a116fa7c780de61cb21f836c5d771a22552c4b568
3
  size 6979130
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45b69b38f30c9123191de0b8828377ed369b0f837f3773e9ff0d96384f02ce82
3
  size 6979130
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:132d841d6075a4630b10f974a8eec92787f412f6496d65f09d0ed31599e2fe94
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a97cec4ccaf7b86834a2fdb06e10135db381a62fd0dc050dc49420427220909
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.04076433121019108,
5
  "eval_steps": 500,
6
- "global_step": 4,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -79,6 +79,24 @@
79
  "rewards/margins": 0.011471111327409744,
80
  "rewards/rejected": -0.2936646640300751,
81
  "step": 4
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
82
  }
83
  ],
84
  "logging_steps": 1,
@@ -93,7 +111,7 @@
93
  "should_evaluate": false,
94
  "should_log": false,
95
  "should_save": true,
96
- "should_training_stop": false
97
  },
98
  "attributes": {}
99
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.050955414012738856,
5
  "eval_steps": 500,
6
+ "global_step": 5,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
79
  "rewards/margins": 0.011471111327409744,
80
  "rewards/rejected": -0.2936646640300751,
81
  "step": 4
82
+ },
83
+ {
84
+ "epoch": 0.050955414012738856,
85
+ "grad_norm": 2.1892218589782715,
86
+ "learning_rate": 0.0,
87
+ "log_odds_chosen": 0.06512074917554855,
88
+ "log_odds_ratio": -0.6671069860458374,
89
+ "logits/chosen": -0.5229994654655457,
90
+ "logits/rejected": -0.5436381697654724,
91
+ "logps/chosen": -2.7552542686462402,
92
+ "logps/rejected": -2.816582679748535,
93
+ "loss": 3.2584,
94
+ "nll_loss": 3.191640615463257,
95
+ "rewards/accuracies": 0.625,
96
+ "rewards/chosen": -0.27552542090415955,
97
+ "rewards/margins": 0.006132860202342272,
98
+ "rewards/rejected": -0.2816582918167114,
99
+ "step": 5
100
  }
101
  ],
102
  "logging_steps": 1,
 
111
  "should_evaluate": false,
112
  "should_log": false,
113
  "should_save": true,
114
+ "should_training_stop": true
115
  },
116
  "attributes": {}
117
  }