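# Download the CoNLL-2003 chunking data (if missing) and fine-tune a BERT model on it.
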
if ! [ -f ./dev.txt ]; then
  echo "Downloading CONLL2003 dev dataset...."
  curl -L -o ./dev.txt 'https://github.com/davidsbatista/NER-datasets/raw/master/CONLL2003/valid.txt'
fi

if ! [ -f ./test.txt ]; then
  echo "Downloading CONLL2003 test dataset...."
  curl -L -o ./test.txt 'https://github.com/davidsbatista/NER-datasets/raw/master/CONLL2003/test.txt'
fi

if ! [ -f ./train.txt ]; then
  echo "Downloading CONLL2003 train dataset...."
  curl -L -o ./train.txt 'https://github.com/davidsbatista/NER-datasets/raw/master/CONLL2003/train.txt'
fi
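
# Training hyperparameters; MAX_LENGTH is the maximum sequence length after tokenization.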
export MAX_LENGTH=200
export BERT_MODEL=bert-base-uncased
export OUTPUT_DIR=chunker-model
export BATCH_SIZE=32
export NUM_EPOCHS=3
export SAVE_STEPS=750
export SEED=1
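
# Run training, evaluation, and prediction; run_ner.py is assumed to read
# train.txt, dev.txt, and test.txt from --data_dir.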
python3 run_ner.py \
--task_type Chunk \
--data_dir . \
--model_name_or_path $BERT_MODEL \
--output_dir $OUTPUT_DIR \
--max_seq_length $MAX_LENGTH \
--num_train_epochs $NUM_EPOCHS \
--per_gpu_train_batch_size $BATCH_SIZE \
--save_steps $SAVE_STEPS \
--seed $SEED \
--do_train \
--do_eval \
--do_predict