Merge branch 'main' of https://huggingface.co/jamarju/roberta-large-bne-squad-2.0-es into main
Browse files
README.md
CHANGED
@@ -37,5 +37,20 @@ Results:
|
|
37 |
Training script:
|
38 |
|
39 |
```
|
40 |
-
python -m torch.distributed.launch --nproc_per_node=3 ./run_qa.py
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
41 |
|
|
|
37 |
Training script:
|
38 |
|
39 |
```
|
40 |
+
python -m torch.distributed.launch --nproc_per_node=3 ./run_qa.py \
|
41 |
+
--model_name_or_path BSC-TeMU/roberta-large-bne \
|
42 |
+
--dataset_name squad_es \
|
43 |
+
--dataset_config_name v2.0.0 \
|
44 |
+
--do_train \
|
45 |
+
--do_eval \
|
46 |
+
--learning_rate 3e-5 \
|
47 |
+
--num_train_epochs 4 \
|
48 |
+
--max_seq_length 384 \
|
49 |
+
--doc_stride 128 \
|
50 |
+
--output_dir ./models/roberta-large-bne-finetuned-squad-es/ \
|
51 |
+
--per_device_eval_batch_size=24 \
|
52 |
+
--per_device_train_batch_size=12 \
|
53 |
+
--version_2_with_negative \
|
54 |
+
--ddp_find_unused_parameters=False
|
55 |
+
```
|
56 |
|