# Dump the tokenizer's vocabulary to "vocab.txt" in the current working
# directory, one token per line. Any existing file is overwritten.
#
# The encoding is pinned to UTF-8 so the output does not depend on the
# platform's locale default; vocabularies commonly contain non-ASCII tokens,
# which a legacy default codec (e.g. cp1252) cannot encode.
#
# NOTE(review): tokens are written in the iteration order of the mapping
# returned by get_vocab(), which is not necessarily token-id order. If
# consumers expect "line number == token id", sort by id first -- confirm.
with open("vocab.txt", "w", encoding="utf-8") as f:
    # Only the keys (the token strings) are written; the mapped values are
    # ignored. writelines() batches the output instead of issuing one write
    # call per token.
    f.writelines(token + "\n" for token in tokenizer.get_vocab().keys())