jun-han committed on
Commit
1421e54
1 Parent(s): 870b37b

Training in progress, step 1001

Browse files
README.md CHANGED
@@ -8,19 +8,19 @@ tags:
8
  datasets:
9
  - mozilla-foundation/common_voice_16_1
10
  model-index:
11
- - name: Wisper-Small-zh_test
12
  results: []
13
  ---
14
 
15
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
16
  should probably proofread and complete it, then remove this comment. -->
17
 
18
- # Wisper-Small-zh_test
19
 
20
  This model is a fine-tuned version of [openai/whisper-small](https://huggingface.co/openai/whisper-small) on the Common Voice 16.1 dataset.
21
  It achieves the following results on the evaluation set:
22
- - Cer: 33.3994
23
  - Loss: 0.6020
 
24
 
25
  ## Model description
26
 
@@ -51,10 +51,10 @@ The following hyperparameters were used during training:
51
 
52
  ### Training results
53
 
54
- | Training Loss | Epoch | Step | Cer | Validation Loss |
55
- |:-------------:|:------:|:----:|:--------:|:---------------:|
56
- | 2.9388 | 0.6623 | 500 | 102.7090 | 2.9818 |
57
- | 0.5492 | 1.3245 | 1000 | 33.3994 | 0.6020 |
58
 
59
 
60
  ### Framework versions
 
8
  datasets:
9
  - mozilla-foundation/common_voice_16_1
10
  model-index:
11
+ - name: Wisper-Small-zh
12
  results: []
13
  ---
14
 
15
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
16
  should probably proofread and complete it, then remove this comment. -->
17
 
18
+ # Wisper-Small-zh
19
 
20
  This model is a fine-tuned version of [openai/whisper-small](https://huggingface.co/openai/whisper-small) on the Common Voice 16.1 dataset.
21
  It achieves the following results on the evaluation set:
 
22
  - Loss: 0.6020
23
+ - Cer: 33.3994
24
 
25
  ## Model description
26
 
 
51
 
52
  ### Training results
53
 
54
+ | Training Loss | Epoch | Step | Validation Loss | Cer |
55
+ |:-------------:|:------:|:----:|:---------------:|:--------:|
56
+ | 2.9388 | 0.6623 | 500 | 2.9818 | 102.7090 |
57
+ | 0.5492 | 1.3245 | 1000 | 0.6020 | 33.3994 |
58
 
59
 
60
  ### Framework versions
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:524602c80ff594d2d365501dce64a850c7efd7f01df64cca55fb5cb68a859cef
3
  size 974076256
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:15e6e52b8a9be9bce4160afe9dd2a674cae1eee39a41915243877ba475553089
3
  size 974076256
runs/Aug03_01-56-24_da41efab0859/events.out.tfevents.1722650475.da41efab0859.34.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a14111bca9897aeafe3f80329922edaa1e4033d18a5ee3a3909aacebb659b4f
3
+ size 7005
trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 33.39944765252322,
3
  "best_model_checkpoint": "/kaggle/working/whisper-small/checkpoint-1000",
4
- "epoch": 1.3258278145695364,
5
  "eval_steps": 500,
6
- "global_step": 1001,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -307,13 +307,13 @@
307
  "step": 1000
308
  },
309
  {
310
- "epoch": 1.3258278145695364,
311
- "step": 1001,
312
- "total_flos": 4.66193748381696e+18,
313
- "train_loss": 0.0006697479780618246,
314
- "train_runtime": 18.134,
315
- "train_samples_per_second": 882.321,
316
- "train_steps_per_second": 55.145
317
  }
318
  ],
319
  "logging_steps": 25,
@@ -333,7 +333,7 @@
333
  "attributes": {}
334
  }
335
  },
336
- "total_flos": 4.66193748381696e+18,
337
  "train_batch_size": 16,
338
  "trial_name": null,
339
  "trial_params": null
 
1
  {
2
  "best_metric": 33.39944765252322,
3
  "best_model_checkpoint": "/kaggle/working/whisper-small/checkpoint-1000",
4
+ "epoch": 1.3245033112582782,
5
  "eval_steps": 500,
6
+ "global_step": 1000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
307
  "step": 1000
308
  },
309
  {
310
+ "epoch": 1.3245033112582782,
311
+ "step": 1000,
312
+ "total_flos": 4.65727933108224e+18,
313
+ "train_loss": 2.47559251499176,
314
+ "train_runtime": 12073.0146,
315
+ "train_samples_per_second": 1.325,
316
+ "train_steps_per_second": 0.083
317
  }
318
  ],
319
  "logging_steps": 25,
 
333
  "attributes": {}
334
  }
335
  },
336
+ "total_flos": 4.65727933108224e+18,
337
  "train_batch_size": 16,
338
  "trial_name": null,
339
  "trial_params": null
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f4cf2b44061539b74e60a14e18c8ca6fb6cec2a6c1d018d5170eccb871bc1589
3
  size 5304
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb88f0fe789f473701fc1eb849990b085024dce0c930792f1b319c440ea3de12
3
  size 5304