Spaces:
Runtime error
Runtime error
| expdir=$1 # EXPDIR | |
| num_operations=${2:-32000} | |
| #`dirname $0`/env.sh | |
| SUBWORD_NMT_DIR="subword-nmt" | |
| data_dir="$expdir/data" | |
| train_file=$data_dir/train | |
| # num_operations=32000 | |
| echo Input file: $train_file | |
| mkdir -p $expdir/vocab | |
| echo "learning source BPE" | |
| python $SUBWORD_NMT_DIR/subword_nmt/learn_bpe.py \ | |
| --input $train_file.SRC \ | |
| -s $num_operations \ | |
| -o $expdir/vocab/bpe_codes.32k.SRC\ | |
| --num-workers -1 | |
| echo "learning target BPE" | |
| python $SUBWORD_NMT_DIR/subword_nmt/learn_bpe.py \ | |
| --input $train_file.TGT \ | |
| -s $num_operations \ | |
| -o $expdir/vocab/bpe_codes.32k.TGT\ | |
| --num-workers -1 | |
| echo "computing SRC vocab" | |
| python $SUBWORD_NMT_DIR/subword_nmt/apply_bpe.py \ | |
| -c $expdir/vocab/bpe_codes.32k.SRC \ | |
| --num-workers -1 \ | |
| -i $train_file.SRC | \ | |
| python $SUBWORD_NMT_DIR/subword_nmt/get_vocab.py \ | |
| > $expdir/vocab/vocab.tmp.SRC | |
| python scripts/clean_vocab.py $expdir/vocab/vocab.tmp.SRC $expdir/vocab/vocab.SRC | |
| rm $expdir/vocab/vocab.tmp.SRC | |
| echo "computing TGT vocab" | |
| python $SUBWORD_NMT_DIR/subword_nmt/apply_bpe.py \ | |
| -c $expdir/vocab/bpe_codes.32k.TGT \ | |
| --num-workers -1 \ | |
| -i $train_file.TGT | \ | |
| python $SUBWORD_NMT_DIR/subword_nmt/get_vocab.py \ | |
| > $expdir/vocab/vocab.tmp.TGT | |
| python scripts/clean_vocab.py $expdir/vocab/vocab.tmp.TGT $expdir/vocab/vocab.TGT | |
| rm $expdir/vocab/vocab.tmp.TGT | |