Spaces:
Building
Building
File size: 334 Bytes
1914537 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 |
from app.bpe_tokenizer import BPETokenizer
def main():
    """Run the one-time BPE model update.

    Creates a ``BPETokenizer`` with its default constructor arguments and
    calls ``update_bpe_model_from_frequencies`` on it with a frequency
    threshold of 10000.
    """
    # Frequency threshold handed to the tokenizer's update routine.
    frequency_threshold = 10000

    bpe = BPETokenizer()
    bpe.update_bpe_model_from_frequencies(frequency_threshold)
# Only run the update when this file is executed as a script, so importing
# the module does not trigger it.
if __name__ == "__main__":
    main()
|