Spaces:

flax-community
/

dalle-mini

Running

boris committed on Jul 15, 2021

Commit

63249ac

•

1 Parent(s): a30dbd3

feat: update scripts

Files changed (2) hide show

seq2seq/do_big_run.sh CHANGED Viewed

@@ -1,16 +1,16 @@
 python run_seq2seq_flax.py \
 	--max_source_length 128 \
-	--train_file /data/CC12M/encoded-small-train.tsv \			# ignored for now in our script
-	--validation_file /data/CC12M/encoded-small-valid.tsv \		# ignored for now in our script
 	--output_dir output \
 	--per_device_train_batch_size 56 \
 	--per_device_eval_batch_size 56 \
 	--preprocessing_num_workers 80 \
-	--warmup_steps 125 \
 	--gradient_accumulation_steps 8 \
 	--do_train \
 	--do_eval \
 	--adafactor \
-	--num_train_epochs 10 \
 	--log_model \
-	--learning_rate 0.001

 python run_seq2seq_flax.py \
 	--max_source_length 128 \
+	--train_file /data/CC12M/encoded-small-train.tsv \
+	--validation_file /data/CC12M/encoded-small-valid.tsv \
 	--output_dir output \
 	--per_device_train_batch_size 56 \
 	--per_device_eval_batch_size 56 \
 	--preprocessing_num_workers 80 \
+	--warmup_steps 250 \
 	--gradient_accumulation_steps 8 \
 	--do_train \
 	--do_eval \
 	--adafactor \
+	--num_train_epochs 6 \
 	--log_model \
+	--learning_rate 0.005

seq2seq/do_small_run.sh CHANGED Viewed

@@ -1,7 +1,7 @@
 python run_seq2seq_flax.py \
 	--max_source_length 128 \
-	--train_file /data/CC12M/encoded-small-train.tsv \			# ignored for now in our script
-	--validation_file /data/CC12M/encoded-small-valid.tsv \		# ignored for now in our script
 	--output_dir output \
 	--per_device_train_batch_size 56 \
 	--per_device_eval_batch_size 56 \
@@ -13,4 +13,4 @@ python run_seq2seq_flax.py \
 	--adafactor \
 	--num_train_epochs 1 \
 	--max_train_samples 20000 \
-	--learning_rate 0.003

 python run_seq2seq_flax.py \
 	--max_source_length 128 \
+	--train_file /data/CC12M/encoded-small-train.tsv \
+	--validation_file /data/CC12M/encoded-small-valid.tsv \
 	--output_dir output \
 	--per_device_train_batch_size 56 \
 	--per_device_eval_batch_size 56 \
 	--adafactor \
 	--num_train_epochs 1 \
 	--max_train_samples 20000 \
+	--learning_rate 0.005