File size: 2,891 Bytes
000db46
d9d123d
 
63d2481
77854d0
63d2481
000db46
 
 
 
 
63d2481
 
 
 
 
 
d9d123d
 
 
63d2481
 
 
 
 
 
000db46
 
 
63d2481
 
 
 
000db46
 
 
63d2481
 
 
 
 
 
77854d0
d9d123d
 
63d2481
 
 
 
 
 
77854d0
d9d123d
 
63d2481
 
 
 
77854d0
d9d123d
 
63d2481
 
 
 
 
 
77854d0
000db46
 
63d2481
 
 
 
 
 
77854d0
d9d123d
000db46
63d2481
 
 
 
 
 
 
000db46
 
d9d123d
63d2481
e461203
dccfed1
77854d0
 
 
 
 
 
 
 
 
 
 
 
 
63d2481
 
000db46
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
{
  "best_metric": null,
  "best_model_checkpoint": null,
  "epoch": 2.733485193621868,
  "eval_steps": 200,
  "global_step": 1200,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "epoch": 0.45558086560364464,
      "eval_loss": 2.580942392349243,
      "eval_runtime": 191.346,
      "eval_samples_per_second": 36.698,
      "eval_steps_per_second": 0.575,
      "eval_wer": 0.9998405506318181,
      "step": 200
    },
    {
      "epoch": 0.9111617312072893,
      "eval_loss": 0.8878806233406067,
      "eval_runtime": 194.7272,
      "eval_samples_per_second": 36.061,
      "eval_steps_per_second": 0.565,
      "eval_wer": 0.6325356435775124,
      "step": 400
    },
    {
      "epoch": 1.1389521640091116,
      "grad_norm": 0.6171550750732422,
      "learning_rate": 0.0001969444444444444,
      "loss": 2.4327,
      "step": 500
    },
    {
      "epoch": 1.366742596810934,
      "eval_loss": 0.6608928442001343,
      "eval_runtime": 195.9363,
      "eval_samples_per_second": 35.838,
      "eval_steps_per_second": 0.561,
      "eval_wer": 0.4896955845812461,
      "step": 600
    },
    {
      "epoch": 1.8223234624145785,
      "eval_loss": 0.668916642665863,
      "eval_runtime": 191.4141,
      "eval_samples_per_second": 36.685,
      "eval_steps_per_second": 0.575,
      "eval_wer": 0.5018270240104173,
      "step": 800
    },
    {
      "epoch": 2.277904328018223,
      "grad_norm": 5.059937000274658,
      "learning_rate": 5.972222222222221e-05,
      "loss": 0.8178,
      "step": 1000
    },
    {
      "epoch": 2.277904328018223,
      "eval_loss": 0.6796883344650269,
      "eval_runtime": 189.9024,
      "eval_samples_per_second": 36.977,
      "eval_steps_per_second": 0.579,
      "eval_wer": 0.4852044273774565,
      "step": 1000
    },
    {
      "epoch": 2.733485193621868,
      "eval_loss": 0.7008175253868103,
      "eval_runtime": 192.012,
      "eval_samples_per_second": 36.571,
      "eval_steps_per_second": 0.573,
      "eval_wer": 0.4816301040407127,
      "step": 1200
    },
    {
      "epoch": 2.733485193621868,
      "step": 1200,
      "total_flos": 9.105570625839254e+18,
      "train_loss": 1.4870800399780273,
      "train_runtime": 3391.8021,
      "train_samples_per_second": 22.643,
      "train_steps_per_second": 0.354
    }
  ],
  "logging_steps": 500,
  "max_steps": 1200,
  "num_input_tokens_seen": 0,
  "num_train_epochs": 3,
  "save_steps": 500,
  "stateful_callbacks": {
    "TrainerControl": {
      "args": {
        "should_epoch_stop": false,
        "should_evaluate": false,
        "should_log": false,
        "should_save": true,
        "should_training_stop": true
      },
      "attributes": {}
    }
  },
  "total_flos": 9.105570625839254e+18,
  "train_batch_size": 64,
  "trial_name": null,
  "trial_params": null
}