jun-han committed on
Commit
d25b49f
1 Parent(s): fe12c4c

Training checkpoint

Browse files
Files changed (2) hide show
  1. README.md +8 -4
  2. trainer_state.json +82 -36
README.md CHANGED
@@ -1,19 +1,23 @@
1
  ---
 
 
2
  license: apache-2.0
3
- base_model: jun-han/whisper-small-zh_chinese
4
  tags:
5
  - generated_from_trainer
 
 
6
  model-index:
7
- - name: whisper-small-zh_chinese
8
  results: []
9
  ---
10
 
11
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
12
  should probably proofread and complete it, then remove this comment. -->
13
 
14
- # whisper-small-zh_chinese
15
 
16
- This model is a fine-tuned version of [jun-han/whisper-small-zh_chinese](https://huggingface.co/jun-han/whisper-small-zh_chinese) on the None dataset.
17
  It achieves the following results on the evaluation set:
18
  - Loss: 4.0346
19
  - Cer: 736.0397
 
1
  ---
2
+ language:
3
+ - zh
4
  license: apache-2.0
5
+ base_model: openai/whisper-small
6
  tags:
7
  - generated_from_trainer
8
+ datasets:
9
+ - Voice_Data_Collection
10
  model-index:
11
+ - name: Whisper-Keep-train
12
  results: []
13
  ---
14
 
15
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
16
  should probably proofread and complete it, then remove this comment. -->
17
 
18
+ # Whisper-Keep-train
19
 
20
+ This model is a fine-tuned version of [openai/whisper-small](https://huggingface.co/openai/whisper-small) on the Voice_Data_Collection dataset.
21
  It achieves the following results on the evaluation set:
22
  - Loss: 4.0346
23
  - Cer: 736.0397
trainer_state.json CHANGED
@@ -1,73 +1,119 @@
1
  {
2
- "best_metric": 96.97789806044203,
3
- "best_model_checkpoint": "/kaggle/working/whisper-small-zh_chinese/checkpoint-50",
4
- "epoch": 1.6129032258064515,
5
  "eval_steps": 50,
6
- "global_step": 100,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
  "epoch": 0.4032258064516129,
13
- "grad_norm": 43.397666931152344,
14
- "learning_rate": 4.000000000000001e-06,
15
- "loss": 11.8023,
16
  "step": 25
17
  },
18
  {
19
  "epoch": 0.8064516129032258,
20
- "grad_norm": 18.771446228027344,
21
- "learning_rate": 9e-06,
22
- "loss": 6.4546,
23
  "step": 50
24
  },
25
  {
26
  "epoch": 0.8064516129032258,
27
- "eval_cer": 96.97789806044203,
28
- "eval_loss": 5.9649481773376465,
29
- "eval_runtime": 49.0271,
30
- "eval_samples_per_second": 2.04,
31
- "eval_steps_per_second": 0.265,
32
  "step": 50
33
  },
34
  {
35
  "epoch": 1.2096774193548387,
36
- "grad_norm": 19.21599006652832,
37
- "learning_rate": 6e-06,
38
- "loss": 5.0872,
39
  "step": 75
40
  },
41
  {
42
  "epoch": 1.6129032258064515,
43
- "grad_norm": 18.573108673095703,
44
- "learning_rate": 1.0000000000000002e-06,
45
- "loss": 4.3235,
46
  "step": 100
47
  },
48
  {
49
  "epoch": 1.6129032258064515,
50
- "eval_cer": 283.2656743346865,
51
- "eval_loss": 4.595037460327148,
52
- "eval_runtime": 105.134,
53
- "eval_samples_per_second": 0.951,
54
- "eval_steps_per_second": 0.124,
55
  "step": 100
56
  },
57
  {
58
- "epoch": 1.6129032258064515,
59
- "step": 100,
60
- "total_flos": 6.436739948544e+17,
61
- "train_loss": 6.916923751831055,
62
- "train_runtime": 1054.0975,
63
- "train_samples_per_second": 1.518,
64
- "train_steps_per_second": 0.095
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
65
  }
66
  ],
67
  "logging_steps": 25,
68
- "max_steps": 100,
69
  "num_input_tokens_seen": 0,
70
- "num_train_epochs": 2,
71
  "save_steps": 50,
72
  "stateful_callbacks": {
73
  "TrainerControl": {
@@ -81,7 +127,7 @@
81
  "attributes": {}
82
  }
83
  },
84
- "total_flos": 6.436739948544e+17,
85
  "train_batch_size": 16,
86
  "trial_name": null,
87
  "trial_params": null
 
1
  {
2
+ "best_metric": 265.17816869643667,
3
+ "best_model_checkpoint": "/kaggle/working/whisper-small-zh_chinese/checkpoint-100",
4
+ "epoch": 3.225806451612903,
5
  "eval_steps": 50,
6
+ "global_step": 200,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
  "epoch": 0.4032258064516129,
13
+ "grad_norm": 21.932130813598633,
14
+ "learning_rate": 4.600000000000001e-06,
15
+ "loss": 3.5703,
16
  "step": 25
17
  },
18
  {
19
  "epoch": 0.8064516129032258,
20
+ "grad_norm": 21.00741958618164,
21
+ "learning_rate": 9.600000000000001e-06,
22
+ "loss": 3.4342,
23
  "step": 50
24
  },
25
  {
26
  "epoch": 0.8064516129032258,
27
+ "eval_cer": 275.1465944970681,
28
+ "eval_loss": 4.133521556854248,
29
+ "eval_runtime": 108.8146,
30
+ "eval_samples_per_second": 0.919,
31
+ "eval_steps_per_second": 0.119,
32
  "step": 50
33
  },
34
  {
35
  "epoch": 1.2096774193548387,
36
+ "grad_norm": 21.135292053222656,
37
+ "learning_rate": 8.533333333333335e-06,
38
+ "loss": 3.3497,
39
  "step": 75
40
  },
41
  {
42
  "epoch": 1.6129032258064515,
43
+ "grad_norm": 21.045244216918945,
44
+ "learning_rate": 6.866666666666667e-06,
45
+ "loss": 3.0912,
46
  "step": 100
47
  },
48
  {
49
  "epoch": 1.6129032258064515,
50
+ "eval_cer": 265.17816869643667,
51
+ "eval_loss": 4.106583595275879,
52
+ "eval_runtime": 97.0216,
53
+ "eval_samples_per_second": 1.031,
54
+ "eval_steps_per_second": 0.134,
55
  "step": 100
56
  },
57
  {
58
+ "epoch": 2.0161290322580645,
59
+ "grad_norm": 20.702259063720703,
60
+ "learning_rate": 5.2e-06,
61
+ "loss": 3.1659,
62
+ "step": 125
63
+ },
64
+ {
65
+ "epoch": 2.4193548387096775,
66
+ "grad_norm": 26.67952537536621,
67
+ "learning_rate": 3.5333333333333335e-06,
68
+ "loss": 2.7991,
69
+ "step": 150
70
+ },
71
+ {
72
+ "epoch": 2.4193548387096775,
73
+ "eval_cer": 318.1326116373478,
74
+ "eval_loss": 4.060230255126953,
75
+ "eval_runtime": 102.4275,
76
+ "eval_samples_per_second": 0.976,
77
+ "eval_steps_per_second": 0.127,
78
+ "step": 150
79
+ },
80
+ {
81
+ "epoch": 2.8225806451612905,
82
+ "grad_norm": 24.625123977661133,
83
+ "learning_rate": 1.8666666666666669e-06,
84
+ "loss": 2.8228,
85
+ "step": 175
86
+ },
87
+ {
88
+ "epoch": 3.225806451612903,
89
+ "grad_norm": 17.782535552978516,
90
+ "learning_rate": 2.0000000000000002e-07,
91
+ "loss": 2.6758,
92
+ "step": 200
93
+ },
94
+ {
95
+ "epoch": 3.225806451612903,
96
+ "eval_cer": 736.0396932792061,
97
+ "eval_loss": 4.034571170806885,
98
+ "eval_runtime": 123.6186,
99
+ "eval_samples_per_second": 0.809,
100
+ "eval_steps_per_second": 0.105,
101
+ "step": 200
102
+ },
103
+ {
104
+ "epoch": 3.225806451612903,
105
+ "step": 200,
106
+ "total_flos": 1.2824839544832e+18,
107
+ "train_loss": 3.1136483764648437,
108
+ "train_runtime": 2250.2712,
109
+ "train_samples_per_second": 1.422,
110
+ "train_steps_per_second": 0.089
111
  }
112
  ],
113
  "logging_steps": 25,
114
+ "max_steps": 200,
115
  "num_input_tokens_seen": 0,
116
+ "num_train_epochs": 4,
117
  "save_steps": 50,
118
  "stateful_callbacks": {
119
  "TrainerControl": {
 
127
  "attributes": {}
128
  }
129
  },
130
+ "total_flos": 1.2824839544832e+18,
131
  "train_batch_size": 16,
132
  "trial_name": null,
133
  "trial_params": null