Model save

Browse files

Files changed (8) hide show

config.json +1 -1
pytorch_model.bin +1 -1
run-initial.sh +31 -0
run.sh +6 -4
runs/Feb02_08-46-53_job-98a7eb1d-c6a6-4e4b-936b-3898557b5e73/1643791725.3471384/events.out.tfevents.1643791725.job-98a7eb1d-c6a6-4e4b-936b-3898557b5e73.544082.1 +3 -0
runs/Feb02_08-46-53_job-98a7eb1d-c6a6-4e4b-936b-3898557b5e73/events.out.tfevents.1643791725.job-98a7eb1d-c6a6-4e4b-936b-3898557b5e73.544082.0 +3 -0
special_tokens_map.json +1 -1
training_args.bin +1 -1

config.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "facebook/wav2vec2-xls-r-1b",
   "activation_dropout": 0.0,
   "adapter_kernel_size": 3,
   "adapter_stride": 2,

 {
+  "_name_or_path": "./checkpoint-10500",
   "activation_dropout": 0.0,
   "adapter_kernel_size": 3,
   "adapter_stride": 2,

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:518f88583acc237a9484294c5836ea827f4ca2979ddb5082958fd5251aec63e0
 size 3850522801

 version https://git-lfs.github.com/spec/v1
+oid sha256:9ca4950372ef0c8087c4959170606fbc72ce4b0e560420df5686b99acb012d8c
 size 3850522801

run-initial.sh ADDED Viewed

	@@ -0,0 +1,31 @@

+python run_speech_recognition_ctc.py \
+	--dataset_name="common_voice" \
+	--model_name_or_path="facebook/wav2vec2-xls-r-1b" \
+	--dataset_config_name="tr" \
+	--output_dir="./" \
+	--overwrite_output_dir \
+	--num_train_epochs="100" \
+	--per_device_train_batch_size="32" \
+	--gradient_accumulation_steps="1" \
+	--learning_rate="5e-4" \
+	--warmup_steps="500" \
+	--evaluation_strategy="steps" \
+	--text_column_name="sentence" \
+	--save_steps="500" \
+	--eval_steps="500" \
+	--logging_steps="1" \
+	--layerdrop="0.0" \
+	--eval_metrics wer cer \
+	--save_total_limit="1" \
+	--mask_time_prob="0.3" \
+	--mask_time_length="10" \
+	--mask_feature_prob="0.1" \
+	--mask_feature_length="64" \
+	--chars_to_ignore , ? . ! - \; \: \" “ % ‘ ” � \
+	--fp16 \
+	--group_by_length \
+	--push_to_hub \
+	--do_train --do_eval \
+	--gradient_checkpointing \
+	--report_to tensorboard \
+	--use_auth_token

run.sh CHANGED Viewed

@@ -1,14 +1,16 @@
 python run_speech_recognition_ctc.py \
 	--dataset_name="common_voice" \
-	--model_name_or_path="facebook/wav2vec2-xls-r-1b" \
 	--dataset_config_name="tr" \
 	--output_dir="./" \
 	--overwrite_output_dir \
-	--num_train_epochs="100" \
 	--per_device_train_batch_size="32" \
 	--gradient_accumulation_steps="1" \
-	--learning_rate="5e-4" \
-	--warmup_steps="500" \
 	--evaluation_strategy="steps" \
 	--text_column_name="sentence" \
 	--save_steps="500" \

 python run_speech_recognition_ctc.py \
 	--dataset_name="common_voice" \
+	--model_name_or_path="./checkpoint-10500" \
 	--dataset_config_name="tr" \
 	--output_dir="./" \
 	--overwrite_output_dir \
+	--num_train_epochs="5" \
 	--per_device_train_batch_size="32" \
 	--gradient_accumulation_steps="1" \
+	--learning_rate="2e-4" \
+	--adam_beta1="0.999" \
+	--adam_beta2="0.9999" \
+	--warmup_steps="0" \
 	--evaluation_strategy="steps" \
 	--text_column_name="sentence" \
 	--save_steps="500" \

runs/Feb02_08-46-53_job-98a7eb1d-c6a6-4e4b-936b-3898557b5e73/1643791725.3471384/events.out.tfevents.1643791725.job-98a7eb1d-c6a6-4e4b-936b-3898557b5e73.544082.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c6b29b1ae9c451e8eab2966f428b2e5c2a227492eeaaeca60368ca3af04965fc
+size 4747

runs/Feb02_08-46-53_job-98a7eb1d-c6a6-4e4b-936b-3898557b5e73/events.out.tfevents.1643791725.job-98a7eb1d-c6a6-4e4b-936b-3898557b5e73.544082.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d1504af2a3148769c7c04d8660bb4d24066021036eb86bfa3a930478875ec83b
+size 5009

special_tokens_map.json CHANGED Viewed

@@ -1 +1 @@

- {"bos_token": "<s>", "eos_token": "</s>", "unk_token": "[UNK]", "pad_token": "[PAD]", "additional_special_tokens": [{"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}]}

+ {"bos_token": "<s>", "eos_token": "</s>", "unk_token": "[UNK]", "pad_token": "[PAD]", "additional_special_tokens": [{"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}]}

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:322e8ae9f01b347bb69390fb3c42730bcf5c1f1587067d51096c85da5f6d9059
 size 2991

 version https://git-lfs.github.com/spec/v1
+oid sha256:c8dee437aaa47d9cbc005e3b550051db80d4617488fe4076bffb7e191ee8a9d6
 size 2991