|
export HF_DATASETS_CACHE="/workspace/.cache/huggingface/datasets" |
|
|
|
python run_mlm.py \ |
|
--model_name_or_path Bingsu/my_mobilebert_untrained \ |
|
--train_file train.txt \ |
|
--validation_file val.txt \ |
|
--per_device_train_batch_size 16 \ |
|
--per_device_eval_batch_size 16 \ |
|
--gradient_accumulation_steps 2 \ |
|
--max_steps 1000000 \ |
|
--lr_scheduler_type cosine_with_restarts \ |
|
--warmup_ratio 0.05 \ |
|
--save_steps 5000 \ |
|
--save_total_limit 5 \ |
|
--logging_steps 5000 \ |
|
--fp16 \ |
|
--optim adamw_torch \ |
|
--do_train \ |
|
--do_eval \ |
|
--push_to_hub \ |
|
--hub_strategy checkpoint \ |
|
--output_dir mobilebert_ko \ |
|
--overwrite_output_dir |