File size: 485 Bytes
d816f2e
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
# Launch run_summarization_flax.py in training mode (--do_train) with
# google/mt5-base as both model and tokenizer, qgen_training_data.csv as the
# training file (text column `context`, summary column `question`), and
# ./mt5-base-qgen as the output directory.
#
# Every line of the command except the last must end with a backslash and
# nothing after it. A missing continuation ends the command early, and the
# shell then tries to execute the next `--flag` line as a command of its own,
# so all options below that point are silently dropped from the python call.
python run_summarization_flax.py \
	--output_dir ./mt5-base-qgen \
	--model_name_or_path google/mt5-base \
	--tokenizer_name google/mt5-base \
	--train_file qgen_training_data.csv \
	--text_column context \
	--summary_column question \
	--do_train \
	--num_train_epochs 3 \
	--learning_rate 5e-5 --warmup_steps 300 \
	--per_device_train_batch_size 2 \
	--per_device_eval_batch_size 2 \
	--overwrite_output_dir \
	--max_source_length 1024 --max_target_length 64 \
	--push_to_hub