luisotorres
committed on
Commit
•
f282230
1
Parent(s):
1b9e91b
Update README.md
Browse files
README.md
CHANGED
@@ -34,6 +34,25 @@ This model is a specialized adaptation of the <b>facebook/bart-large-xsum</b>, f
|
|
34 |
## Development
|
35 |
- Kaggle Notebook: [Text Summarization with Large Language Models](https://www.kaggle.com/code/lusfernandotorres/text-summarization-with-large-language-models)
|
36 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
37 |
## Usage
|
38 |
|
39 |
```python
|
|
|
34 |
## Development
|
35 |
- Kaggle Notebook: [Text Summarization with Large Language Models](https://www.kaggle.com/code/lusfernandotorres/text-summarization-with-large-language-models)
|
36 |
|
37 |
+
## Training Parameters
|
38 |
+
```python
|
39 |
+
evaluation_strategy = "epoch",
|
40 |
+
save_strategy = 'epoch',
|
41 |
+
load_best_model_at_end = True,
|
42 |
+
metric_for_best_model = 'eval_loss',
|
43 |
+
seed = 42,
|
44 |
+
learning_rate=2e-5,
|
45 |
+
per_device_train_batch_size=4,
|
46 |
+
per_device_eval_batch_size=4,
|
47 |
+
gradient_accumulation_steps=2,
|
48 |
+
weight_decay=0.01,
|
49 |
+
save_total_limit=2,
|
50 |
+
num_train_epochs=4,
|
51 |
+
predict_with_generate=True,
|
52 |
+
fp16=True,
|
53 |
+
report_to="none"
|
54 |
+
```
|
55 |
+
|
56 |
## Usage
|
57 |
|
58 |
```python
|