bogdancazan
committed on
Commit
•
4bba065
1
Parent(s):
5d8eb37
Create README.md
Browse files
README.md
ADDED
@@ -0,0 +1,17 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
training_args = TrainingArguments(
|
2 |
+
output_dir='bart-base-newsela-biendata-with-domain-adaptation',
|
3 |
+
num_train_epochs=20,
|
4 |
+
warmup_steps=250,
|
5 |
+
per_device_train_batch_size=BATCH_SIZE,
|
6 |
+
weight_decay=0.01,
|
7 |
+
learning_rate=2e-4,
|
8 |
+
fp16=True,
|
9 |
+
optim="adafactor",
|
10 |
+
)
|
11 |
+
|
12 |
+
Step Training Loss
|
13 |
+
500 599.802100
|
14 |
+
1000 367.138000
|
15 |
+
1500 8.558800
|
16 |
+
2000 2.705000
|
17 |
+
TrainOutput(global_step=2320, training_loss=211.1473583352977, metrics={'train_runtime': 976.5416, 'train_samples_per_second': 303.807, 'train_steps_per_second': 2.376, 'total_flos': 0.0, 'train_loss': 211.1473583352977, 'epoch': 20.0})
|