Update README.md
Browse files
README.md
CHANGED
@@ -28,6 +28,40 @@ We present the dev results on SQuAD 1.1/2.0 and MNLI tasks.
|
|
28 |
| **DeBERTa-v3-base** | 93.9/88.4 | 88.4/85.4 | 90.5 |
|
29 |
| DeBERTa-v3-base+SiFT | -/- | -/- | **91.0** |
|
30 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
31 |
|
32 |
### Citation
|
33 |
|
|
|
28 |
| **DeBERTa-v3-base** | 93.9/88.4 | 88.4/85.4 | 90.5 |
|
29 |
| DeBERTa-v3-base+SiFT | -/- | -/- | **91.0** |
|
30 |
|
31 |
+
#### Fine-tuning with HF transformers
|
32 |
+
|
33 |
+
```bash
|
34 |
+
#!/bin/bash
|
35 |
+
|
36 |
+
cd transformers/examples/pytorch/text-classification/
|
37 |
+
|
38 |
+
pip install datasets
|
39 |
+
export TASK_NAME=mnli
|
40 |
+
|
41 |
+
output_dir="ds_results"
|
42 |
+
|
43 |
+
num_gpus=8
|
44 |
+
|
45 |
+
batch_size=8
|
46 |
+
|
47 |
+
python -m torch.distributed.launch --nproc_per_node=${num_gpus} \
|
48 |
+
run_glue.py \
|
49 |
+
--model_name_or_path microsoft/deberta-v3-base \
|
50 |
+
--task_name $TASK_NAME \
|
51 |
+
--do_train \
|
52 |
+
--do_eval \
|
53 |
+
--evaluation_strategy steps \
|
54 |
+
--max_seq_length 256 \
|
55 |
+
--warmup_steps 1000 \
|
56 |
+
--per_device_train_batch_size ${batch_size} \
|
57 |
+
--learning_rate 2.5e-5 \
|
58 |
+
--num_train_epochs 3 \
|
59 |
+
--output_dir $output_dir \
|
60 |
+
--overwrite_output_dir \
|
61 |
+
--logging_steps 1000 \
|
62 |
+
--logging_dir $output_dir
|
63 |
+
|
64 |
+
```
|
65 |
|
66 |
### Citation
|
67 |
|