Update README.md
Browse files
README.md
CHANGED
|
@@ -28,6 +28,40 @@ We present the dev results on SQuAD 1.1/2.0 and MNLI tasks.
|
|
| 28 |
| **DeBERTa-v3-base** | 93.9/88.4 | 88.4/85.4 | 90.5 |
|
| 29 |
| DeBERTa-v3-base+SiFT | -/- | -/- | **91.0** |
|
| 30 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 31 |
|
| 32 |
### Citation
|
| 33 |
|
|
|
|
| 28 |
| **DeBERTa-v3-base** | 93.9/88.4 | 88.4/85.4 | 90.5 |
|
| 29 |
| DeBERTa-v3-base+SiFT | -/- | -/- | **91.0** |
|
| 30 |
|
| 31 |
+
#### Fine-tuning with Hugging Face Transformers
|
| 32 |
+
|
| 33 |
+
```bash
|
| 34 |
+
#!/bin/bash
|
| 35 |
+
|
| 36 |
+
cd transformers/examples/pytorch/text-classification/
|
| 37 |
+
|
| 38 |
+
pip install datasets
|
| 39 |
+
export TASK_NAME=mnli
|
| 40 |
+
|
| 41 |
+
output_dir="ds_results"
|
| 42 |
+
|
| 43 |
+
num_gpus=8
|
| 44 |
+
|
| 45 |
+
batch_size=8
|
| 46 |
+
|
| 47 |
+
python -m torch.distributed.launch --nproc_per_node=${num_gpus} \
|
| 48 |
+
run_glue.py \
|
| 49 |
+
--model_name_or_path microsoft/deberta-v3-base \
|
| 50 |
+
--task_name $TASK_NAME \
|
| 51 |
+
--do_train \
|
| 52 |
+
--do_eval \
|
| 53 |
+
--evaluation_strategy steps \
|
| 54 |
+
--max_seq_length 256 \
|
| 55 |
+
--warmup_steps 1000 \
|
| 56 |
+
--per_device_train_batch_size ${batch_size} \
|
| 57 |
+
--learning_rate 2.5e-5 \
|
| 58 |
+
--num_train_epochs 3 \
|
| 59 |
+
--output_dir $output_dir \
|
| 60 |
+
--overwrite_output_dir \
|
| 61 |
+
--logging_steps 1000 \
|
| 62 |
+
--logging_dir $output_dir
|
| 63 |
+
|
| 64 |
+
```
|
| 65 |
|
| 66 |
### Citation
|
| 67 |
|