File size: 1,695 Bytes
1da9e2f
35b1422
1da9e2f
35b1422
1da9e2f
 
 
 
 
 
 
35b1422
1da9e2f
35b1422
1da9e2f
 
 
35b1422
1da9e2f
35b1422
1da9e2f
 
 
35b1422
 
 
 
 
 
1da9e2f
 
 
35b1422
1da9e2f
35b1422
1da9e2f
 
 
35b1422
 
 
 
 
 
1da9e2f
 
 
35b1422
1da9e2f
35b1422
1da9e2f
 
 
35b1422
 
 
 
 
 
1da9e2f
 
 
 
 
35b1422
1da9e2f
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
{
  "best_metric": 1.127414345741272,
  "best_model_checkpoint": "/kaggle/output/checkpoint-3000",
  "epoch": 0.12222946544980444,
  "eval_steps": 1000,
  "global_step": 3000,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "epoch": 0.0,
      "learning_rate": 2.7777777777777777e-11,
      "loss": 1.029,
      "step": 1
    },
    {
      "epoch": 0.04,
      "learning_rate": 2.7638888888888893e-08,
      "loss": 1.181,
      "step": 1000
    },
    {
      "epoch": 0.04,
      "eval_accuracy": 0.3273453093812375,
      "eval_loss": 1.1529844999313354,
      "eval_runtime": 54.2837,
      "eval_samples_per_second": 92.293,
      "eval_steps_per_second": 11.55,
      "step": 1000
    },
    {
      "epoch": 0.08,
      "learning_rate": 5.541666666666667e-08,
      "loss": 1.1527,
      "step": 2000
    },
    {
      "epoch": 0.08,
      "eval_accuracy": 0.33013972055888224,
      "eval_loss": 1.1351025104522705,
      "eval_runtime": 54.0518,
      "eval_samples_per_second": 92.689,
      "eval_steps_per_second": 11.6,
      "step": 2000
    },
    {
      "epoch": 0.12,
      "learning_rate": 8.316666666666666e-08,
      "loss": 1.142,
      "step": 3000
    },
    {
      "epoch": 0.12,
      "eval_accuracy": 0.3317365269461078,
      "eval_loss": 1.127414345741272,
      "eval_runtime": 54.0871,
      "eval_samples_per_second": 92.628,
      "eval_steps_per_second": 11.592,
      "step": 3000
    }
  ],
  "logging_steps": 1000,
  "max_steps": 10000000,
  "num_train_epochs": 408,
  "save_steps": 1000,
  "total_flos": 6271065391104000.0,
  "trial_name": null,
  "trial_params": null
}