jun-han committed on
Commit
870b37b
1 Parent(s): e133d55

Training checkpoint

Browse files
Files changed (2) hide show
  1. README.md +7 -5
  2. trainer_state.json +10 -10
README.md CHANGED
@@ -1,21 +1,23 @@
1
  ---
 
 
2
  license: apache-2.0
3
- base_model: jun-han/whisper-small-zh
4
  tags:
5
  - generated_from_trainer
6
  datasets:
7
- - common_voice_16_1
8
  model-index:
9
- - name: whisper-small
10
  results: []
11
  ---
12
 
13
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
14
  should probably proofread and complete it, then remove this comment. -->
15
 
16
- # whisper-small
17
 
18
- This model is a fine-tuned version of [jun-han/whisper-small-zh](https://huggingface.co/jun-han/whisper-small-zh) on the common_voice_16_1 dataset.
19
  It achieves the following results on the evaluation set:
20
  - Cer: 33.3994
21
  - Loss: 0.6020
 
1
  ---
2
+ language:
3
+ - zh
4
  license: apache-2.0
5
+ base_model: openai/whisper-small
6
  tags:
7
  - generated_from_trainer
8
  datasets:
9
+ - mozilla-foundation/common_voice_16_1
10
  model-index:
11
+ - name: Wisper-Small-zh_test
12
  results: []
13
  ---
14
 
15
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
16
  should probably proofread and complete it, then remove this comment. -->
17
 
18
+ # Wisper-Small-zh_test
19
 
20
+ This model is a fine-tuned version of [openai/whisper-small](https://huggingface.co/openai/whisper-small) on the Common Voice 16.1 dataset.
21
  It achieves the following results on the evaluation set:
22
  - Cer: 33.3994
23
  - Loss: 0.6020
trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 33.39944765252322,
3
  "best_model_checkpoint": "/kaggle/working/whisper-small/checkpoint-1000",
4
- "epoch": 1.3245033112582782,
5
  "eval_steps": 500,
6
- "global_step": 1000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -307,13 +307,13 @@
307
  "step": 1000
308
  },
309
  {
310
- "epoch": 1.3245033112582782,
311
- "step": 1000,
312
- "total_flos": 4.65727933108224e+18,
313
- "train_loss": 2.47559251499176,
314
- "train_runtime": 12073.0146,
315
- "train_samples_per_second": 1.325,
316
- "train_steps_per_second": 0.083
317
  }
318
  ],
319
  "logging_steps": 25,
@@ -333,7 +333,7 @@
333
  "attributes": {}
334
  }
335
  },
336
- "total_flos": 4.65727933108224e+18,
337
  "train_batch_size": 16,
338
  "trial_name": null,
339
  "trial_params": null
 
1
  {
2
  "best_metric": 33.39944765252322,
3
  "best_model_checkpoint": "/kaggle/working/whisper-small/checkpoint-1000",
4
+ "epoch": 1.3258278145695364,
5
  "eval_steps": 500,
6
+ "global_step": 1001,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
307
  "step": 1000
308
  },
309
  {
310
+ "epoch": 1.3258278145695364,
311
+ "step": 1001,
312
+ "total_flos": 4.66193748381696e+18,
313
+ "train_loss": 0.0006697479780618246,
314
+ "train_runtime": 18.134,
315
+ "train_samples_per_second": 882.321,
316
+ "train_steps_per_second": 55.145
317
  }
318
  ],
319
  "logging_steps": 25,
 
333
  "attributes": {}
334
  }
335
  },
336
+ "total_flos": 4.66193748381696e+18,
337
  "train_batch_size": 16,
338
  "trial_name": null,
339
  "trial_params": null