# sanchit-gandhi's picture
# add training scripts
# 4b48e5c
# raw
# history blame contribute delete
# 950 Bytes
deepspeed run_audio_classification.py \
--deepspeed ds_config.json \
--model_name_or_path openai/whisper-medium \
--dataset_name google/xtreme_s \
--dataset_config_name fleurs.all \
--output_dir ./ \
--overwrite_output_dir \
--remove_unused_columns False \
--do_train \
--do_eval \
--fp16 \
--learning_rate 3e-5 \
--max_length_seconds 30 \
--label_column_name lang_id \
--attention_mask False \
--warmup_ratio 0.1 \
--num_train_epochs 3 \
--per_device_train_batch_size 16 \
--gradient_accumulation_steps 2 \
--gradient_checkpointing True \
--per_device_eval_batch_size 32 \
--dataloader_num_workers 8 \
--logging_strategy steps \
--logging_steps 25 \
--evaluation_strategy epoch \
--save_strategy epoch \
--load_best_model_at_end True \
--metric_for_best_model accuracy \
--seed 0 \
--freeze_feature_encoder False \
--push_to_hub